
# @package _global_
# Dataset overrides applied by this configuration.
dataset:
  # NOTE(review): -1 looks like a "no limit / use everything" sentinel;
  # confirm against the code that reads `dataset.max_number`.
  max_number: -1

# Hyperparameters for the model, all scoped under the `multi` entry.
model:
  multi:
    optimizer:
      learning_rate: 0.01
    batch_size: 64
    # NOTE(review): 24 is evenly divisible by num_heads (3) below; if the
    # consumer splits this width across attention heads, keep the two values
    # compatible when tuning either one -- confirm against the model code.
    seq_hidden_units: 24
    br_size: 88
    fc_hidden_units: 44
    dropout_rate: 0.1
    num_layer: 1
    num_heads: 3

    self_positional_encoding:
      # NOTE(review): presumably the clipping distance for relative positions;
      # verify against the positional-encoding implementation.
      max_relative_position: 20

# Experiment / training-run settings.
# Booleans are written in canonical lowercase (`true`/`false`) so they parse
# identically under YAML 1.1 and YAML 1.2 loaders.
exp:
  weights_ema: true
  # NOTE(review): `alpha` and `beta` are consumed elsewhere; presumably `beta`
  # is the decay used when `weights_ema` is on and `alpha` weights the
  # `balancing` objective -- confirm against the training code.
  alpha: 0.01
  beta: 0.99
  balancing: domain_confusion
  max_epochs: 200
  early_stopping: true
  early_stopping_patience: 20
